import pandas as pd
import matplotlib
import numpy as np
import matplotlib.pyplot as plt
import matplotlib.dates as mdt
import seaborn as sns
import mplfinance
from pylab import rcParams
%matplotlib inline
import os
import warnings
warnings.filterwarnings('ignore')
from statsmodels.tsa.stattools import adfuller
from statsmodels.tsa.seasonal import seasonal_decompose
from statsmodels.tsa.arima_model import ARIMA
from pmdarima.arima import auto_arima
from sklearn.metrics import mean_squared_error, mean_absolute_error
import math


# Load the closing-price table, coerce 'Date' to datetime, order the rows
# chronologically and use the dates as the row index.
Prices = pd.read_csv("C:\\...\\Closing prices 2012-2021.csv", parse_dates=['Date'])
Prices = (
    Prices
    .assign(Date=pd.to_datetime(Prices['Date']))
    .sort_values(by="Date")
    .set_index('Date')
)
# Clear the index label so the rendered table has no separate 'Date' header.
Prices.index.name = None
Prices


# Per-column summary statistics (count, mean, std, quartiles, min/max).
Prices.describe()


# Apply the seaborn theme BEFORE the figure is created: axes pick up the style
# and font scale at creation time, so setting it after plotting (as was done
# originally) leaves this first figure in matplotlib's default look.
sns.set(font_scale=1.5, style="whitegrid")

# Exponential moving averages of the PFE close with a 20-span (short-term)
# and a 200-span (long-term) window.
PFE_short_term_EMA = Prices['Close PFE USD'].ewm(span=20, adjust=False).mean()
PFE_long_term_EMA = Prices['Close PFE USD'].ewm(span=200, adjust=False).mean()


# Two stacked panels: close vs. long-term EMA on top, close vs. short-term
# EMA below.
fig, ax = plt.subplots(2, 1, figsize=(16, 9))
ax[0].plot(Prices['Close PFE USD'], "cadetblue", label='PFE Close')
ax[0].plot(PFE_long_term_EMA, 'indianred', label='Long-term EMA')
ax[1].plot(Prices['Close PFE USD'], "cadetblue", label='PFE Close')
# 'darkorchid' matches the short-term EMA colour used by every other ticker
# figure in this file (this one used 'indianred' for both EMAs).
ax[1].plot(PFE_short_term_EMA, 'darkorchid', label='Short-term EMA')

ax[0].set_title('PFE Long-Term EMA')
ax[1].set_title('PFE Short-Term EMA')

ax[0].legend(loc='upper left', frameon=False)
ax[1].legend(loc='upper left', frameon=False)

plt.tight_layout()


# Exponential moving averages of the AZN close: 20-span (short-term) and
# 200-span (long-term).
AZN_close = Prices['Close AZN USD']
AZN_short_term_EMA = AZN_close.ewm(span=20, adjust=False).mean()
AZN_long_term_EMA = AZN_close.ewm(span=200, adjust=False).mean()


# One row per panel: (axes, EMA series, EMA colour, EMA legend label, title).
fig, ax = plt.subplots(2, 1, figsize=(16,9))
AZN_panels = [
    (ax[0], AZN_long_term_EMA, 'indianred', 'Long-term EMA', 'AZN Long-Term EMA'),
    (ax[1], AZN_short_term_EMA, 'darkorchid', 'Short-term EMA', 'AZN Short-Term EMA'),
]
for panel, ema, ema_colour, ema_label, panel_title in AZN_panels:
    # The raw close is drawn first so the EMA line sits on top of it.
    panel.plot(AZN_close, "cadetblue", label='AZN Close')
    panel.plot(ema, ema_colour, label=ema_label)
    panel.set_title(panel_title)
    panel.legend(loc='upper left', frameon=False)

plt.tight_layout()
sns.set(font_scale=1.5, style="whitegrid")


# Exponential moving averages of the NSDAQ close.
# NOTE(review): the long-term span is 250 here, while the other tickers in
# this file use 200 — confirm the difference is intentional.
NSDAQ_close = Prices['Close NSDAQ USD']
NSDAQ_short_term_EMA = NSDAQ_close.ewm(span=20, adjust=False).mean()
NSDAQ_long_term_EMA = NSDAQ_close.ewm(span=250, adjust=False).mean()


# One row per panel: (axes, EMA series, EMA colour, EMA legend label, title).
fig, ax = plt.subplots(2, 1, figsize=(16,9))
NSDAQ_panels = [
    (ax[0], NSDAQ_long_term_EMA, 'indianred', 'Long-term EMA', 'NSDAQ Long-Term EMA'),
    (ax[1], NSDAQ_short_term_EMA, 'darkorchid', 'Short-term EMA', 'NSDAQ Short-Term EMA'),
]
for panel, ema, ema_colour, ema_label, panel_title in NSDAQ_panels:
    # The raw close is drawn first so the EMA line sits on top of it.
    panel.plot(NSDAQ_close, "slategrey", label='NSDAQ Close')
    panel.plot(ema, ema_colour, label=ema_label)
    panel.set_title(panel_title)
    panel.legend(loc='upper left', frameon=False)

plt.tight_layout()
sns.set(font_scale=1.5, style="whitegrid")


# Exponential moving averages of the AAPL close: 20-span (short-term) and
# 200-span (long-term).
AAPL_close = Prices['Close AAPL USD']
AAPL_short_term_EMA = AAPL_close.ewm(span=20, adjust=False).mean()
AAPL_long_term_EMA = AAPL_close.ewm(span=200, adjust=False).mean()


# One row per panel: (axes, EMA series, EMA colour, EMA legend label, title).
fig, ax = plt.subplots(2, 1, figsize=(16,9))
AAPL_panels = [
    (ax[0], AAPL_long_term_EMA, 'indianred', 'Long-term EMA', 'AAPL Long-Term EMA'),
    (ax[1], AAPL_short_term_EMA, 'darkorchid', 'Short-term EMA', 'AAPL Short-Term EMA'),
]
for panel, ema, ema_colour, ema_label, panel_title in AAPL_panels:
    # The raw close is drawn first so the EMA line sits on top of it.
    panel.plot(AAPL_close, "slategrey", label='AAPL Close')
    panel.plot(ema, ema_colour, label=ema_label)
    panel.set_title(panel_title)
    panel.legend(loc='upper left', frameon=False)

plt.tight_layout()
sns.set(font_scale=1.5, style="whitegrid")


# Exponential moving averages of the NSRGF close: 20-span (short-term) and
# 200-span (long-term).
NSRGF_close = Prices['Close NSRGF USD']
NSRGF_short_term_EMA = NSRGF_close.ewm(span=20, adjust=False).mean()
NSRGF_long_term_EMA = NSRGF_close.ewm(span=200, adjust=False).mean()


# One row per panel: (axes, EMA series, EMA colour, EMA legend label, title).
fig, ax = plt.subplots(2, 1, figsize=(16,9))
NSRGF_panels = [
    (ax[0], NSRGF_long_term_EMA, 'indianred', 'Long-term EMA', 'NSRGF Long-Term EMA'),
    (ax[1], NSRGF_short_term_EMA, 'darkorchid', 'Short-term EMA', 'NSRGF Short-Term EMA'),
]
for panel, ema, ema_colour, ema_label, panel_title in NSRGF_panels:
    # The raw close is drawn first so the EMA line sits on top of it.
    panel.plot(NSRGF_close, "darkseagreen", label='NSRGF Close')
    panel.plot(ema, ema_colour, label=ema_label)
    panel.set_title(panel_title)
    panel.legend(loc='upper left', frameon=False)

plt.tight_layout()
sns.set(font_scale=1.5, style="whitegrid")


# Exponential moving averages of the KO close: 20-span (short-term) and
# 200-span (long-term).
KO_close = Prices['Close KO USD']
KO_short_term_EMA = KO_close.ewm(span=20, adjust=False).mean()
KO_long_term_EMA = KO_close.ewm(span=200, adjust=False).mean()


# One row per panel: (axes, EMA series, EMA colour, EMA legend label, title).
fig, ax = plt.subplots(2, 1, figsize=(16,9))
KO_panels = [
    (ax[0], KO_long_term_EMA, 'indianred', 'Long-term EMA', 'KO Long-Term EMA'),
    (ax[1], KO_short_term_EMA, 'darkorchid', 'Short-term EMA', 'KO Short-Term EMA'),
]
for panel, ema, ema_colour, ema_label, panel_title in KO_panels:
    # The raw close is drawn first so the EMA line sits on top of it.
    panel.plot(KO_close, "darkseagreen", label='KO Close')
    panel.plot(ema, ema_colour, label=ema_label)
    panel.set_title(panel_title)
    panel.legend(loc='upper left', frameon=False)

plt.tight_layout()
sns.set(font_scale=1.5, style="whitegrid")


# Raw closing prices of the two series that are modelled with ARIMA further
# down, one per stacked panel.
fig, ax = plt.subplots(2, 1, figsize=(16,9))
price_panels = zip(
    ax,
    ('Close AZN USD', 'Close NSDAQ USD'),
    ("cadetblue", "slategrey"),
    ('AZN Close', 'NSDAQ Close'),
    ('AZN Price 2012 01-2021 12', 'NSDAQ Price 2012 01-2021 12'),
)
for panel, column, colour, legend_label, panel_title in price_panels:
    panel.plot(Prices[column], colour, label=legend_label)
    panel.set_title(panel_title)
    panel.legend(loc='upper left', frameon=False)

plt.tight_layout()
sns.set(font_scale=1.5, style="whitegrid")


# Augmented Dickey-Fuller test on the raw closes; only the p-value (second
# element of the result tuple) is reported.
adf_targets = (
    ("ADF p-value AZN:", 'Close AZN USD'),
    ("ADF p-value NSDAQ:", 'Close NSDAQ USD'),
)
for adf_label, adf_column in adf_targets:
    adf_result = adfuller(Prices[adf_column])
    print(adf_label, adf_result[1])

ADF p-value AZN: 0.7996286742279053
ADF p-value NSDAQ: 1.0


# Additive decomposition of the AZN close with a 60-observation cycle.
# NOTE(review): newer statsmodels releases name this argument `period`;
# `freq` is kept because this file imports the legacy
# `statsmodels.tsa.arima_model` API — confirm against the installed version.
AZN_seasonality = seasonal_decompose(Prices['Close AZN USD'], model='additive', freq = 60)
# DecomposeResult.plot() builds its own figure, so no plt.figure() call is
# needed (the extra call only produced an empty "0 Axes" figure). Keep the
# returned Figure in `fig` instead of the None returned by set_size_inches.
fig = AZN_seasonality.plot()
fig.set_size_inches(16, 9)

<Figure size 432x288 with 0 Axes>


# Additive decomposition of the NSDAQ close with a 60-observation cycle.
# NOTE(review): newer statsmodels releases name this argument `period`;
# `freq` is kept because this file imports the legacy
# `statsmodels.tsa.arima_model` API — confirm against the installed version.
NSDAQ_seasonality = seasonal_decompose(Prices['Close NSDAQ USD'], model='additive', freq = 60)
# DecomposeResult.plot() builds its own figure, so no plt.figure() call is
# needed (the extra call only produced an empty "0 Axes" figure). Keep the
# returned Figure in `fig` instead of the None returned by set_size_inches.
fig = NSDAQ_seasonality.plot()
fig.set_size_inches(16, 9)

<Figure size 432x288 with 0 Axes>


# Default size for every figure created from here on (set once; the second,
# identical assignment was redundant).
rcParams['figure.figsize'] = 16, 9

# Natural-log closing prices plus their 12-observation rolling mean and
# standard deviation. Each ticker gets its own names so the AZN statistics
# are no longer overwritten by the NSDAQ ones.
AZN_log = np.log(Prices['Close AZN USD'])
AZN_MA = AZN_log.rolling(12).mean()
AZN_STD = AZN_log.rolling(12).std()

NSDAQ_log = np.log(Prices['Close NSDAQ USD'])
NSDAQ_MA = NSDAQ_log.rolling(12).mean()
NSDAQ_STD = NSDAQ_log.rolling(12).std()

# Backward-compatible aliases: `MA` / `STD` previously ended up holding the
# NSDAQ values, so they keep doing so for any code that still reads them.
MA, STD = NSDAQ_MA, NSDAQ_STD


# Chronological train/test split of the log series: the first part is used
# for fitting, the remainder is held out.
# NOTE(review): AZN is split 70/30 while NSDAQ is split 90/10 — confirm the
# different ratios are intentional.
AZN_cut = int(len(AZN_log)*0.70)
train_AZN = AZN_log[0:AZN_cut]
test_AZN = AZN_log[AZN_cut:]

NSDAQ_cut = int(len(NSDAQ_log)*0.90)
train_NSDAQ = NSDAQ_log[0:NSDAQ_cut]
test_NSDAQ = NSDAQ_log[NSDAQ_cut:]

# Show where each log series is cut into training and held-out segments.
plt.figure(figsize=(16,9))
# Plot the training slice itself: the curve labelled "Train" previously drew
# the full series, so it also ran underneath the test segment.
plt.plot(train_AZN, 'cadetblue', label='AZN Train')
plt.plot(test_AZN, 'indianred', label='AZN Test')

plt.plot(train_NSDAQ, 'slategrey', label='NSDAQ Train')
plt.plot(test_NSDAQ, 'sandybrown', label='NSDAQ Test')
plt.legend(loc='upper left', frameon=False)

<matplotlib.legend.Legend at 0x26a511e96a0>


# Stepwise, non-seasonal order search on the AZN training series: p and q
# range from 0 to 3, and d is left for the ADF test to choose (d=None).
ARIMA_Model = auto_arima(
    train_AZN,
    start_p=0,
    start_q=0,
    test='adf',
    max_p=3,
    max_q=3,
    m=1,
    d=None,
    seasonal=False,
    start_P=0,
    D=0,
    trace=True,
    error_action='ignore',
    suppress_warnings=True,
    stepwise=True,
)

Performing stepwise search to minimize aic
 ARIMA(0,1,0)(0,0,0)[0] intercept   : AIC=-9968.176, Time=0.21 sec
 ARIMA(1,1,0)(0,0,0)[0] intercept   : AIC=-9967.525, Time=0.23 sec
 ARIMA(0,1,1)(0,0,0)[0] intercept   : AIC=-9967.563, Time=0.20 sec
 ARIMA(0,1,0)(0,0,0)[0]             : AIC=-9969.487, Time=0.15 sec
 ARIMA(1,1,1)(0,0,0)[0] intercept   : AIC=-9965.028, Time=0.55 sec

Best model:  ARIMA(0,1,0)(0,0,0)[0]          
Total fit time: 1.355 seconds


# Fit ARIMA(0,1,0) — the order reported by the stepwise search — on the AZN
# training series and display the fit summary.
# NOTE(review): the search's best model is listed without an intercept, while
# the summary of this fit reports a `const` term — confirm whether the
# constant should be dropped here.
AZN_order = (0,1,0)
AZN_ARIMA_Model = ARIMA(train_AZN, order=AZN_order)
fitted_from_above_AZN = AZN_ARIMA_Model.fit()
fitted_from_above_AZN.summary()

C:\Users\Simona\anaconda3\lib\site-packages\statsmodels\tsa\base\tsa_model.py:581: ValueWarning: A date index has been provided, but it has no associated frequency information and so will be ignored when e.g. forecasting.
  warnings.warn('A date index has been provided, but it has no'
C:\Users\Simona\anaconda3\lib\site-packages\statsmodels\tsa\base\tsa_model.py:581: ValueWarning: A date index has been provided, but it has no associated frequency information and so will be ignored when e.g. forecasting.
  warnings.warn('A date index has been provided, but it has no'


# Stepwise, non-seasonal order search on the NSDAQ training series: p and q
# range from 0 to 3, and d is left for the ADF test to choose (d=None).
# This rebinds ARIMA_Model, replacing the earlier AZN search result.
ARIMA_Model = auto_arima(
    train_NSDAQ,
    start_p=0,
    start_q=0,
    test='adf',
    max_p=3,
    max_q=3,
    m=1,
    d=None,
    seasonal=False,
    start_P=0,
    D=0,
    trace=True,
    error_action='ignore',
    suppress_warnings=True,
    stepwise=True,
)

Performing stepwise search to minimize aic
 ARIMA(0,1,0)(0,0,0)[0] intercept   : AIC=-12533.901, Time=0.30 sec
 ARIMA(1,1,0)(0,0,0)[0] intercept   : AIC=-12543.093, Time=0.33 sec
 ARIMA(0,1,1)(0,0,0)[0] intercept   : AIC=-12542.377, Time=0.26 sec
 ARIMA(0,1,0)(0,0,0)[0]             : AIC=-12530.647, Time=0.12 sec
 ARIMA(2,1,0)(0,0,0)[0] intercept   : AIC=-12543.945, Time=0.34 sec
 ARIMA(3,1,0)(0,0,0)[0] intercept   : AIC=-12547.461, Time=0.69 sec
 ARIMA(3,1,1)(0,0,0)[0] intercept   : AIC=-12554.554, Time=2.56 sec
 ARIMA(2,1,1)(0,0,0)[0] intercept   : AIC=-12541.666, Time=2.30 sec
 ARIMA(3,1,2)(0,0,0)[0] intercept   : AIC=-12547.410, Time=0.60 sec
 ARIMA(2,1,2)(0,0,0)[0] intercept   : AIC=-12539.425, Time=1.60 sec
 ARIMA(3,1,1)(0,0,0)[0]             : AIC=-12541.874, Time=0.46 sec

Best model:  ARIMA(3,1,1)(0,0,0)[0] intercept
Total fit time: 9.570 seconds


# Fit ARIMA(3,1,1) — the order reported by the stepwise search — on the NSDAQ
# training series and display the fit summary.
NSDAQ_order = (3,1,1)
NSDAQ_ARIMA_Model = ARIMA(train_NSDAQ, order=NSDAQ_order)
fitted_from_above_NSDAQ = NSDAQ_ARIMA_Model.fit()
fitted_from_above_NSDAQ.summary()

C:\Users\Simona\anaconda3\lib\site-packages\statsmodels\tsa\base\tsa_model.py:581: ValueWarning: A date index has been provided, but it has no associated frequency information and so will be ignored when e.g. forecasting.
  warnings.warn('A date index has been provided, but it has no'
C:\Users\Simona\anaconda3\lib\site-packages\statsmodels\tsa\base\tsa_model.py:581: ValueWarning: A date index has been provided, but it has no associated frequency information and so will be ignored when e.g. forecasting.
  warnings.warn('A date index has been provided, but it has no'


# Forecast exactly one step per held-out observation. The horizon has to
# equal len(test_AZN), otherwise re-indexing the forecast by the test dates
# below fails with a length mismatch; deriving it from the data keeps this
# correct if the data set or the split ratio changes (it was hard-coded 750).
AZN_horizon = len(test_AZN)
fc1, se, conf = fitted_from_above_AZN.forecast(AZN_horizon, alpha=0.05)


# Align the point forecast and the interval bounds (alpha=0.05) with the
# test dates. `conf` has one row per step: column 0 is the lower bound and
# column 1 the upper bound.
forecast_series_AZN = pd.Series(fc1, index=test_AZN.index)
lower_series_AZN = pd.Series(conf[:, 0], index=test_AZN.index)
# Fixed: the upper series was previously built from column 0 (the lower bound).
upper_series_AZN = pd.Series(conf[:, 1], index=test_AZN.index)


# Forecast exactly one step per held-out observation. The horizon has to
# equal len(test_NSDAQ), otherwise re-indexing the forecast by the test dates
# below fails with a length mismatch; deriving it from the data keeps this
# correct if the data set or the split ratio changes (it was hard-coded 250).
NSDAQ_horizon = len(test_NSDAQ)
fc2, se, conf = fitted_from_above_NSDAQ.forecast(NSDAQ_horizon, alpha=0.05)


# Align the point forecast and the interval bounds (alpha=0.05) with the
# test dates. `conf` has one row per step: column 0 is the lower bound and
# column 1 the upper bound.
forecast_series_NSDAQ = pd.Series(fc2, index=test_NSDAQ.index)
lower_series_NSDAQ = pd.Series(conf[:, 0], index=test_NSDAQ.index)
# Fixed: the upper series was previously built from column 0 (the lower bound).
upper_series_NSDAQ = pd.Series(conf[:, 1], index=test_NSDAQ.index)


# Overlay, for both tickers, the training series, the held-out series and the
# forecast on the current axes. Only the NSDAQ forecast carries a legend
# label, so the legend shows a single 'Prediction' entry for the green lines.
forecast_axes = plt.gca()

forecast_axes.plot(train_AZN, 'cadetblue', label='AZN Historical data')
forecast_axes.plot(test_AZN, color = 'indianred', label='AZN Stock Price')
forecast_axes.plot(forecast_series_AZN, color = 'green')

forecast_axes.plot(train_NSDAQ, 'slategrey', label='NSDAQ Historical data')
forecast_axes.plot(test_NSDAQ, color = 'sandybrown', label='NSDAQ Stock Price')
forecast_axes.plot(forecast_series_NSDAQ, color = 'green',label='Prediction')

forecast_axes.legend(loc='upper left', frameon=False)

<matplotlib.legend.Legend at 0x26a50d5fb80>


# Mean absolute percentage error of each forecast against its held-out series.
# NOTE(review): both the forecasts and the test series are log prices here, so
# this is a relative error on the log scale, not on the price itself —
# confirm that is the intended metric.
AZN_relative_error = np.abs(fc1 - test_AZN) / np.abs(test_AZN)
NSDAQ_relative_error = np.abs(fc2 - test_NSDAQ) / np.abs(test_NSDAQ)

MAPE_AZN = np.mean(AZN_relative_error)
MAPE_NSDAQ = np.mean(NSDAQ_relative_error)

for mape_prefix, mape_value in (('MAPE AZN: ', MAPE_AZN), ('MAPE NSDAQ: ', MAPE_NSDAQ)):
    print(mape_prefix + str(mape_value))

MAPE AZN: 0.03651058508201623
MAPE NSDAQ: 0.03846177730169523

	Close PFE USD	Close NSDAQ USD	Close NSRGF USD	Close AAPL USD	Close AZN USD	Close KO USD
2012-01-03	21.48	24.96	58.25	14.69	23.86	35.07
2012-01-04	21.28	24.62	57.75	14.77	23.74	34.85
2012-01-05	21.11	24.66	57.20	14.93	23.43	34.69
2012-01-06	21.08	24.43	56.60	15.09	23.49	34.47
2012-01-09	21.33	24.33	57.41	15.06	23.29	34.47
...	...	...	...	...	...	...
2021-11-26	54.00	203.68	131.31	156.81	56.58	53.73
2021-11-29	52.40	209.08	131.30	160.24	55.53	54.58
2021-11-30	53.73	203.23	129.00	165.30	54.83	52.45
2021-12-01	54.68	199.03	127.57	164.77	54.88	52.30
2021-12-02	53.04	201.23	128.48	163.76	54.79	53.07

	Close PFE USD	Close NSDAQ USD	Close NSRGF USD	Close AAPL USD	Close AZN USD	Close KO USD
count	2497.000000	2497.000000	2497.000000	2497.000000	2497.000000	2497.000000
mean	33.252002	75.290224	84.917145	48.040521	36.423244	44.604537
std	5.767063	42.992460	18.819134	37.214999	10.341610	5.607982
min	20.480000	21.240000	55.800000	13.950000	20.020000	33.500000
25%	29.640000	39.920000	72.850000	23.610000	29.040000	40.600000
50%	33.280000	68.340000	77.600000	32.190000	34.280000	43.510000
75%	36.320000	95.130000	99.040000	53.060000	41.270000	47.630000
max	54.680000	212.830000	135.640000	165.300000	63.830000	60.130000

Dep. Variable:	D.Close AZN USD	No. Observations:	1746
Model:	ARIMA(0, 1, 0)	Log Likelihood	4986.088
Method:	css	S.D. of innovations	0.014
Date:	Sun, 05 Dec 2021	AIC	-9968.176
Time:	23:17:22	BIC	-9957.246
Sample:	1	HQIC	-9964.135

	coef	std err	z	P>\|z\|	[0.025	0.975]
const	0.0003	0.000	0.830	0.407	-0.000	0.001

Dep. Variable:	D.Close NSDAQ USD	No. Observations:	2246
Model:	ARIMA(3, 1, 1)	Log Likelihood	6283.278
Method:	css-mle	S.D. of innovations	0.015
Date:	Sun, 05 Dec 2021	AIC	-12554.556
Time:	23:17:32	BIC	-12520.254
Sample:	1	HQIC	-12542.035

Technical Stock Price Analysis with Exponential Moving Average (EMA) and Forecasting using ARIMA Model
¶

1. Data and Descriptive Statistics¶

1.1 Described Data¶

2. Exponentially Weighted Moving Average (EMA) Analysis by Sector¶

2.1 Health Care Sector: Short & Long Term EMA¶

2.2 Technology Sector: Short & Long Term EMA¶

2.3 Food Sector: Short & Long Term EMA¶

2.4 Interim Conclusions¶

3. Stock Price Forecasting with Autoregressive Integrated Moving Average (ARIMA): AZN and NSDAQ¶

3.1 Time Series Decomposition¶

3.2 Building ARIMA Model: AZN and NSDAQ¶

Conclusions¶

Analysis Limitations¶

For Further Analysis¶

	Real	Imaginary	Modulus	Frequency
AR.1	1.7133	-1.1476j	2.0621	-0.0939
AR.2	1.7133	+1.1476j	2.0621	0.0939
AR.3	-2.6858	-0.0000j	2.6858	-0.5000
MA.1	1.9910	+0.0000j	1.9910	0.0000

	coef	std err	z	P>\|z\|	[0.025	0.975]
const	0.0007	0.000	2.741	0.006	0.000	0.001
ar.L1.D.Close NSDAQ USD	0.4335	0.121	3.584	0.000	0.196	0.671
ar.L2.D.Close NSDAQ USD	0.0649	0.024	2.655	0.008	0.017	0.113
ar.L3.D.Close NSDAQ USD	-0.0876	0.021	-4.154	0.000	-0.129	-0.046
ma.L1.D.Close NSDAQ USD	-0.5023	0.120	-4.183	0.000	-0.738	-0.267

Technical Stock Price Analysis with Exponential Moving Average (EMA) and Forecasting using ARIMA Model ¶

1. Data and Descriptive Statistics¶

1.1 Described Data¶

2. Exponentially Weighted Moving Average (EMA) Analysis by Sector¶

2.1 Health Care Sector: Short & Long Term EMA¶

2.2 Technology Sector: Short & Long Term EMA¶

2.3 Food Sector: Short & Long Term EMA¶

2.4 Interim Conclusions¶

3. Stock Price Forecasting with Autoregressive Integrated Moving Average (ARIMA): AZN and NSDAQ¶

3.1 Time Series Decomposition¶

3.2 Building ARIMA Model: AZN and NSDAQ¶

Conclusions¶

Analysis Limitations¶

For Further Analysis¶

Technical Stock Price Analysis with Exponential Moving Average (EMA) and Forecasting using ARIMA Model
¶